% Workshop contribution: the venue is a booktitle, not a journal.
@inproceedings{pyslamSemantic2025,
  author    = {Morilla-Cabello, David and Montijano, Eduardo},
  title     = {Semantic {pySLAM}: Unifying semantic mapping approaches under the same framework},
  booktitle = {RSS 2025 Workshop, Unifying Visual SLAM},
  year      = {2025}
}

% The acronym is braced so sentence-casing styles keep it in capitals.
@inproceedings{lin2023clip,
  author    = {Lin, Yuqi and Chen, Minghao and Wang, Wenxiao and Wu, Boxi and Li, Ke and Lin, Binbin and Liu, Haifeng and He, Xiaofei},
  title     = {{CLIP} is also an efficient segmenter: A text-driven approach for weakly supervised semantic segmentation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition},
  pages     = {15305--15314},
  year      = {2023}
}

@article{xie2021segformer,
  author  = {Xie, Enze and Wang, Wenhai and Yu, Zhiding and Anandkumar, Anima and Alvarez, Jose M and Luo, Ping},
  title   = {SegFormer: Simple and efficient design for semantic segmentation with transformers},
  journal = {Advances in neural information processing systems},
  volume  = {34},
  pages   = {12077--12090},
  year    = {2021}
}

@article{chen2017rethinking,
  author  = {Chen, Liang-Chieh and Papandreou, George and Schroff, Florian and Adam, Hartwig},
  title   = {Rethinking atrous convolution for semantic image segmentation},
  journal = {arXiv preprint arXiv:1706.05587},
  year    = {2017}
}

% Pages use the ACM article-number form (article 139, 14 pages).
@article{kerbl20233d,
  author  = {Kerbl, Bernhard and Kopanas, Georgios and Leimk{\"u}hler, Thomas and Drettakis, George},
  title   = {{3D} {Gaussian} splatting for real-time radiance field rendering},
  journal = {ACM Transactions on Graphics},
  volume  = {42},
  number  = {4},
  pages   = {139:1--139:14},
  year    = {2023}
}

% arXiv preprint of the work that is also listed under the key MonoGS.
@article{matsuki2023gaussian,
  author  = {Matsuki, Hidenobu and Murai, Riku and Kelly, Paul H. J. and Davison, Andrew J.},
  title   = {{Gaussian} Splatting {SLAM}},
  journal = {arXiv preprint arXiv:2312.06741},
  year    = {2023}
}

@article{dong2022ash,
  author    = {Dong, Wei and Lao, Yixing and Kaess, Michael and Koltun, Vladlen},
  title     = {ASH: A modern framework for parallel spatial hashing in 3D perception},
  journal   = {IEEE transactions on pattern analysis and machine intelligence},
  volume    = {45},
  number    = {5},
  pages     = {5417--5435},
  publisher = {IEEE},
  year      = {2022}
}

% Empty volume/number fields removed; page range uses an en-dash (double hyphen).
@inproceedings{PTAM,
  author    = {Klein, Georg and Murray, David},
  title     = {Parallel Tracking and Mapping for Small {AR} Workspaces},
  booktitle = {2007 6th IEEE and ACM International Symposium on Mixed and Augmented Reality},
  pages     = {225--234},
  year      = {2007},
  keywords  = {Robot vision systems;Cameras;Tracking;Yarn;Robustness;Layout;Simultaneous localization and mapping;Algorithm design and analysis;Concurrent computing;Handheld computers},
  doi       = {10.1109/ISMAR.2007.4538852}
}
  
% Conference paper: venue moved from journal to booktitle, organization to publisher.
@inproceedings{rosten2006machine,
  author    = {Rosten, Edward and Drummond, Tom},
  title     = {Machine learning for high-speed corner detection},
  booktitle = {European Conference on Computer Vision},
  pages     = {430--443},
  year      = {2006},
  publisher = {Springer}
}

% Conference paper: venue moved from journal to booktitle, organization to publisher.
@inproceedings{shi1994good,
  author    = {Shi, Jianbo and Tomasi, Carlo},
  title     = {Good features to track},
  booktitle = {1994 Proceedings of IEEE Conference on Computer Vision and Pattern Recognition},
  pages     = {593--600},
  year      = {1994},
  publisher = {IEEE}
}

% Conference paper: venue moved to booktitle; acronyms braced against style recasing.
@inproceedings{rublee2011orb,
  author    = {Rublee, Ethan and Rabaud, Vincent and Konolige, Kurt and Bradski, Gary},
  title     = {{ORB}: An efficient alternative to {SIFT} or {SURF}},
  booktitle = {2011 International Conference on Computer Vision},
  pages     = {2564--2571},
  year      = {2011},
  publisher = {IEEE}
}

% Conference paper: venue moved from journal to booktitle; publisher spelling fixed.
@inproceedings{lowe1999object,
  author    = {Lowe, David G.},
  title     = {Object recognition from local scale-invariant features},
  booktitle = {Proceedings of the Seventh IEEE International Conference on Computer Vision},
  volume    = {2},
  pages     = {1150--1157},
  year      = {1999},
  publisher = {IEEE}
}

% Conference paper: venue moved from journal to booktitle, organization to publisher.
@inproceedings{bay2006surf,
  author    = {Bay, Herbert and Tuytelaars, Tinne and Van Gool, Luc},
  title     = {{SURF}: Speeded up robust features},
  booktitle = {European Conference on Computer Vision},
  pages     = {404--417},
  year      = {2006},
  publisher = {Springer}
}

% Conference paper: venue moved from journal to booktitle, organization to publisher.
@inproceedings{alcantarilla2012kaze,
  author    = {Alcantarilla, Pablo F. and Bartoli, Adrien and Davison, Andrew J.},
  title     = {{KAZE} features},
  booktitle = {European Conference on Computer Vision},
  pages     = {214--227},
  year      = {2012},
  publisher = {Springer}
}

% Venue corrected: this paper appeared at BMVC 2013; the earlier TPAMI
% volume/number/pages came from a known-bad scraped record and were dropped.
@inproceedings{alcantarilla2013fast,
  author    = {Alcantarilla, Pablo F. and Nuevo, Jes{\'u}s and Bartoli, Adrien},
  title     = {Fast explicit diffusion for accelerated features in nonlinear scale spaces},
  booktitle = {Proceedings of the British Machine Vision Conference (BMVC)},
  year      = {2013},
  publisher = {BMVA Press}
}

% Conference paper: venue moved from journal to booktitle, organization to publisher.
@inproceedings{leutenegger2011brisk,
  author    = {Leutenegger, Stefan and Chli, Margarita and Siegwart, Roland Y.},
  title     = {{BRISK}: Binary robust invariant scalable keypoints},
  booktitle = {2011 International Conference on Computer Vision},
  pages     = {2548--2555},
  year      = {2011},
  publisher = {IEEE}
}

% Conference paper: venue moved to booktitle; the scraped number field was not
% an issue number and is dropped (inproceedings cannot take both volume and number).
@inproceedings{matas2002robust,
  author    = {Matas, Jiri and Chum, Ondrej and Urban, Martin and Pajdla, Tomas},
  title     = {Robust wide-baseline stereo from maximally stable extremal regions},
  booktitle = {Proceedings of the British Machine Vision Conference},
  volume    = {1},
  pages     = {384--393},
  year      = {2002},
  publisher = {BMVA Press}
}

% Conference paper: venue moved from journal to booktitle, organization to publisher.
@inproceedings{trzcinski2013boosting,
  author    = {Trzcinski, Tomasz and Christoudias, Marios and Fua, Pascal and Lepetit, Vincent},
  title     = {Boosting binary keypoint descriptors},
  booktitle = {2013 IEEE Conference on Computer Vision and Pattern Recognition},
  pages     = {2874--2881},
  year      = {2013},
  publisher = {IEEE}
}

@article{tola2010daisy,
  author    = {Tola, Engin and Lepetit, Vincent and Fua, Pascal},
  title     = {Daisy: An efficient dense descriptor applied to wide-baseline stereo},
  journal   = {IEEE transactions on pattern analysis and machine intelligence},
  volume    = {32},
  number    = {5},
  pages     = {815--830},
  publisher = {IEEE},
  year      = {2010}
}

% Record corrected: LATCH is a WACV 2016 conference paper by Levi and Hassner;
% the earlier title, third author and TPAMI volume data did not match it.
@inproceedings{levi2006latch,
  author    = {Levi, Gil and Hassner, Tal},
  title     = {{LATCH}: Learned arrangements of three patch codes},
  booktitle = {2016 IEEE Winter Conference on Applications of Computer Vision (WACV)},
  pages     = {1--9},
  year      = {2016},
  publisher = {IEEE}
}

@article{simonyan2014learning,
  author    = {Simonyan, Karen and Vedaldi, Andrea and Zisserman, Andrew},
  title     = {Learning local feature descriptors using convex optimisation},
  journal   = {IEEE transactions on pattern analysis and machine intelligence},
  volume    = {36},
  number    = {8},
  pages     = {1573--1585},
  publisher = {IEEE},
  year      = {2014}
}

@article{mishchuk2017working,
  author  = {Mishchuk, Anastasiia and Mishkin, Dmytro and Radenovic, Filip and Matas, Jiri},
  title   = {Working hard to know your neighbor's margins: Local descriptor learning loss},
  journal = {Advances in neural information processing systems},
  volume  = {30},
  year    = {2017}
}

% Conference paper: venue moved from journal to booktitle; acronym braced.
@inproceedings{verdie2018tilde,
  author    = {Verdie, Yannick and Yi, Kwang Moo and Fua, Pascal and Lepetit, Vincent},
  title     = {{TILDE}: A temporally invariant learned detector},
  booktitle = {Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition},
  pages     = {5279--5288},
  year      = {2015}
}

% Conference paper: venue moved from journal to booktitle; acronyms braced.
@inproceedings{dusmanu2019d2,
  author    = {Dusmanu, Mihai and Rocco, Ignacio and Pajdla, Tomas and Pollefeys, Marc and Sivic, Josef and Torii, Akihiko and Sattler, Torsten},
  title     = {{D2-Net}: A trainable {CNN} for joint description and detection of local features},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition},
  pages     = {8092--8101},
  year      = {2019}
}

% Conference paper: venue moved to booktitle; third author's given name
% now agrees with the entry keyed DELF for the same paper.
@inproceedings{noh2017large,
  author    = {Noh, Hyeonwoo and Araujo, Andre and Sim, Jack and Weyand, Tobias and Han, Bohyung},
  title     = {Large-scale image retrieval with attentive deep local features},
  booktitle = {Proceedings of the IEEE International Conference on Computer Vision},
  pages     = {3456--3465},
  year      = {2017}
}

% Author list and year now agree with the entry keyed Contextdesc (CVPR 2019);
% the conference venue is moved from journal to booktitle.
@inproceedings{luo2020contextdesc,
  author    = {Luo, Zixin and Shen, Tianwei and Zhou, Lei and Zhang, Jiahui and Yao, Yao and Li, Shiwei and Fang, Tian and Quan, Long},
  title     = {{ContextDesc}: Local descriptor augmentation with cross-modality context},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition},
  pages     = {2527--2536},
  year      = {2019}
}

% First author's given name now agrees with the entry keyed LFNet for the same paper.
@article{ono2018lf,
  author  = {Ono, Yuki and Trulls, Eduard and Fua, Pascal and Yi, Kwang Moo},
  title   = {{LF-Net}: Learning local features from images},
  journal = {Advances in Neural Information Processing Systems},
  volume  = {31},
  year    = {2018}
}

% Author list now agrees with the entry keyed R2D2 (the NeurIPS 2019 version).
@article{revaud2019r2d2,
  author  = {Revaud, Jerome and Weinzaepfel, Philippe and de Souza, C{\'e}sar Roberto and Humenberger, Martin},
  title   = {{R2D2}: Repeatable and reliable detector and descriptor},
  journal = {Advances in Neural Information Processing Systems},
  volume  = {32},
  year    = {2019}
}

% Venue corrected: Key.Net was published at ICCV 2019 (these page numbers
% belong to that volume); the conference is moved from journal to booktitle.
@inproceedings{barroso2020key,
  author    = {Barroso-Laguna, Axel and Riba, Edgar and Ponsa, Daniel and Mikolajczyk, Krystian},
  title     = {{Key.Net}: Keypoint detection by handcrafted and learned {CNN} filters},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision},
  pages     = {5836--5844},
  year      = {2019},
  url       = {https://github.com/axelBarroso/Key.Net}
}

% First author's given name now agrees with the entry keyed DISK for the same paper.
@article{tyszkiewicz2020disk,
  author  = {Tyszkiewicz, Micha{\l} and Fua, Pascal and Trulls, Eduard},
  title   = {{DISK}: Learning local features with policy gradient},
  journal = {Advances in Neural Information Processing Systems},
  volume  = {33},
  pages   = {14254--14265},
  year    = {2020}
}

% Title and authors corrected to match arXiv:2304.03608; the earlier author
% list was a copy of the Key.Net authors.
@article{barroso2023alike,
  author  = {Zhao, Xiaoming and Wu, Xingming and Chen, Weihai and Chen, Peter C. Y. and Xu, Qingsong and Li, Zhengguo},
  title   = {{ALIKED}: A lighter keypoint and descriptor extraction network via deformable transformation},
  journal = {arXiv preprint arXiv:2304.03608},
  year    = {2023}
}

% Title and authors corrected to match arXiv:2404.19174; this is the preprint
% of the paper that is also listed under the key Xfeat.
@article{barroso2024xfeat,
  author  = {Potje, Guilherme and Cadar, Felipe and Araujo, Andr{\'e} and Martins, Renato and Nascimento, Erickson R.},
  title   = {{XFeat}: Accelerated features for lightweight image matching},
  journal = {arXiv preprint arXiv:2404.19174},
  year    = {2024}
}

@article{galvez2012bags,
  author    = {Galvez-Lopez, Dorian and Tardos, Juan D},
  title     = {Bags of binary words for fast place recognition in image sequences},
  journal   = {IEEE Transactions on Robotics},
  volume    = {28},
  number    = {5},
  pages     = {1188--1197},
  publisher = {IEEE},
  year      = {2012}
}

% Scraped record repaired: the page range had been stored in the number field
% and the conference acronym in journal.
@inproceedings{muja2009fast,
  author    = {Muja, Marius and Lowe, David G.},
  title     = {Fast approximate nearest neighbors with automatic algorithm configuration},
  booktitle = {International Conference on Computer Vision Theory and Applications (VISAPP)},
  pages     = {331--340},
  year      = {2009}
}

% Conference paper: venue moved from journal to booktitle.
@inproceedings{neubert2021hyperdimensional,
  author    = {Neubert, Peer and Protzel, Peter},
  title     = {Hyperdimensional computing as a framework for systematic aggregation of image descriptors},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition},
  pages     = {9067--9076},
  year      = {2021}
}

% Conference paper: venue moved from journal to booktitle; acronyms braced.
@inproceedings{arandjelovic2016netvlad,
  author    = {Arandjelovic, Relja and Gronat, Petr and Torii, Akihiko and Pajdla, Tomas and Sivic, Josef},
  title     = {{NetVLAD}: {CNN} architecture for weakly supervised place recognition},
  booktitle = {Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition},
  pages     = {5297--5307},
  year      = {2016}
}

% CosPlace paper. The earlier record carried the arXiv id of a different paper
% (2304.03608) and an invented title; the published title omits the method name.
@inproceedings{berton2023cosplace,
  author    = {Berton, Gabriele and Masone, Carlo and Caputo, Barbara},
  title     = {Rethinking Visual Geo-localization for Large-Scale Applications},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition},
  year      = {2022}
}

% The earlier record carried the arXiv id of a different paper (2404.19174,
% which cannot belong to a 2023 publication) plus a wrong title and author list.
@inproceedings{berton2023eigenplaces,
  author    = {Berton, Gabriele and Trivigno, Gabriele and Caputo, Barbara and Masone, Carlo},
  title     = {{EigenPlaces}: Training Viewpoint Robust Models for Visual Place Recognition},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision},
  year      = {2023}
}

@article{berton2025megaloc,
  author  = {Berton, Gabriele and Masone, Carlo},
  title   = {Megaloc: One retrieval to place them all},
  journal = {arXiv preprint arXiv:2502.17237},
  year    = {2025}
}

@article{hirschmuller2007stereo,
  author    = {Hirschmuller, Heiko},
  title     = {Stereo processing by semiglobal matching and mutual information},
  journal   = {IEEE Transactions on pattern analysis and machine intelligence},
  volume    = {30},
  number    = {2},
  pages     = {328--341},
  publisher = {IEEE},
  year      = {2007}
}

@article{depthpro2023,
  author  = {Bochkovskii, Aleksei and Delaunoy, Ama{\"e}l and Germain, Hugo and Santos, Marcel and Zhou, Yichao and Richter, Stephan R and Koltun, Vladlen},
  title   = {Depth pro: Sharp monocular metric depth in less than a second},
  journal = {arXiv preprint arXiv:2410.02073},
  url     = {https://github.com/apple/ml-depth-pro},
  year    = {2024}
}

% Title and authors replaced with the real ones for arXiv:2406.09414, as given
% in the entry keyed DepthAnythingV2 (the earlier record used a placeholder author).
@article{depthanythingv2_2024,
  author  = {Yang, Lihe and Kang, Bingyi and Huang, Zilong and Zhao, Zhen and Xu, Xiaogang and Feng, Jiashi and Zhao, Hengshuang},
  title   = {{Depth Anything V2}},
  journal = {arXiv preprint arXiv:2406.09414},
  year    = {2024}
}

% Title and authors corrected to match arXiv:2109.07547, as given in the
% entry keyed RAFTStereo (first author and subtitle were wrong).
@article{teed2021raft,
  author  = {Lipson, Lahav and Teed, Zachary and Deng, Jia},
  title   = {{RAFT-Stereo}: Multilevel Recurrent Field Transforms for Stereo Matching},
  journal = {arXiv preprint arXiv:2109.07547},
  year    = {2021}
}

% Title and authors corrected to match arXiv:2203.11483 (the CREStereo paper),
% as given in the entry keyed CREStereo.
@article{li2022cres,
  author  = {Li, Jiankun and Wang, Peisen and Xiong, Pengfei and Cai, Tao and Yan, Ziwei and Yang, Lei and Liu, Jiangyu and Fan, Haoqiang and Liu, Shuaicheng},
  title   = {Practical stereo matching via cascaded recurrent network with adaptive correlation},
  journal = {arXiv preprint arXiv:2203.11483},
  year    = {2022}
}

% Author list corrected; accents are written as LaTeX escapes so the entry
% also works with classic 8-bit BibTeX.
@article{zollhofer2018state,
  author    = {Zollh{\"o}fer, Michael and Stotko, Patrick and G{\"o}rlitz, Andreas and Theobalt, Christian and Nie{\ss}ner, Matthias and Klein, Reinhard and Kolb, Andreas},
  title     = {State of the art on {3D} reconstruction with {RGB-D} cameras},
  journal   = {Computer Graphics Forum},
  volume    = {37},
  number    = {2},
  pages     = {625--652},
  year      = {2018},
  publisher = {Wiley Online Library}
}

@misc{ORB_SLAM2,
  title={ORB-SLAM2: An Open-Source SLAM System for Monocular, Stereo and RGB-D Cameras},
  author={Raul Mur-Artal and Juan D. Tardos},
  url={https://github.com/raulmur/ORB_SLAM2},
  year={2017}
}

@misc{learnopencv,
  title={Camera Calibration using OpenCV},
  author={Satya Mallick},
  url={https://learnopencv.com/camera-calibration-using-opencv/},
  year={2016}
}

@misc{opencv,
  title={Camera Calibration},
  author={OpenCV},
  url={https://docs.opencv.org/4.x/dc/dbb/tutorial_py_calibration.html},
  year={2021}
}

@misc{Pangolin,
  title={Pangolin: Lightweight Portable Rapid Development Library for Managing OpenGL Display / Interaction and Abstracting Context},
  author={Steven Lovegrove},
  url={https://github.com/stevenlovegrove/Pangolin},
  year={2017}
}

@misc{g2opy,
  title={g2opy: Python bindings for g2o},
  author={uoip},
  url={https://github.com/uoip/g2opy},
  year={2018}
}

@inproceedings{detone18superpoint,
  title={SuperPoint: Self-Supervised Interest Point Detection and Description},
  author={Daniel DeTone and Tomasz Malisiewicz and Andrew Rabinovich},
  booktitle={CVPR Deep Learning for Visual SLAM Workshop},
  url={http://arxiv.org/abs/1712.07629},
  year={2018}
}

% Scraped volume/number/pages values (1, 2, 3) were placeholders, not real data,
% and are dropped; the stray line break after the entry is removed.
@inproceedings{Tfeat,
  author    = {Balntas, Vassileios and Riba, Edgar and Ponsa, Daniel and Mikolajczyk, Krystian},
  title     = {Learning local feature descriptors with triplets and shallow convolutional neural networks},
  booktitle = {Proceedings of the British Machine Vision Conference (BMVC)},
  year      = {2016}
}

@misc{ImageMatchingBenchmarkBaselines,
  title={Image Matching Benchmark Baselines},
  author={vcg-uvic},
  url={https://github.com/vcg-uvic/image-matching-benchmark-baselines},
  year={2020}
}

@inproceedings{Hardnet,
  title     = {{Working hard to know your neighbor's margins: Local descriptor learning loss}},
  author    = {Anastasiya Mishchuk and Dmytro Mishkin and Filip Radenovic and Jiri Matas},
  booktitle = {Proceedings of NeurIPS},
  month     = dec,
  year      = {2017},
  url       = {https://github.com/DagnyT/hardnet.git}
}

@inproceedings{GeoDesc,
  author    = {Luo, Zixin and Shen, Tianwei and Zhou, Lei and Zhu, Siyu and Zhang, Runze and Yao, Yao and Fang, Tian and Quan, Long},
  title     = {Geodesc: Learning local descriptors by integrating geometry constraints},
  booktitle = {Proceedings of the European conference on computer vision (ECCV)},
  pages     = {168--183},
  url       = {https://github.com/lzx551402/geodesc.git},
  year      = {2018}
}

@inproceedings{SOSNet,
  author    = {Tian, Yurun and Yu, Xin and Fan, Bin and Wu, Fuchao and Heijnen, Huub and Balntas, Vassileios},
  title     = {Sosnet: Second order similarity regularization for local descriptor learning},
  booktitle = {Proceedings of the IEEE/CVF conference on computer vision and pattern recognition},
  pages     = {11016--11025},
  url       = {https://github.com/yuruntian/SOSNet.git},
  year      = {2019}
}

@inproceedings{L2Net,
  author    = {Tian, Yurun and Fan, Bin and Wu, Fuchao},
  title     = {L2-net: Deep learning of discriminative patch descriptor in euclidean space},
  booktitle = {Proceedings of the IEEE conference on computer vision and pattern recognition},
  pages     = {661--669},
  url       = {https://github.com/yuruntian/L2-Net},
  year      = {2017}
}

% Conference paper: an article entry ignores booktitle and requires journal,
% so the venue was silently dropped; the type is now inproceedings.
@inproceedings{LogPolarDescriptor,
  author    = {Patrick Ebel and Anastasiia Mishchuk and Kwang Moo Yi and Pascal Fua and Eduard Trulls},
  title     = {Beyond {Cartesian} Representations for Local Descriptors},
  booktitle = {Proc. of ICCV},
  year      = {2019},
  url       = {https://github.com/cvlab-epfl/log-polar-descriptors}
}


@inproceedings{D2Net,
  title     = {{D2-Net: A Trainable CNN for Joint Detection and Description of Local Features}},
  author    = {Dusmanu, Mihai and Rocco, Ignacio and Pajdla, Tomas and Pollefeys, Marc and Sivic, Josef and Torii, Akihiko and Sattler, Torsten},
  booktitle = {Proceedings of the 2019 IEEE/CVF Conference on Computer Vision and Pattern Recognition},
  url       = {https://github.com/mihaidusmanu/d2-net},
  year      = {2019}
}

@inproceedings{DELF,
  author    = {Noh, Hyeonwoo and Araujo, Andre and Sim, Jack and Weyand, Tobias and Han, Bohyung},
  title     = {Large-scale image retrieval with attentive deep local features},
  booktitle = {Proceedings of the IEEE international conference on computer vision},
  pages     = {3456--3465},
  year      = {2017}
}

% Conference paper: venue moved from journal to booktitle; method name braced.
@inproceedings{Contextdesc,
  author    = {Luo, Zixin and Shen, Tianwei and Zhou, Lei and Zhang, Jiahui and Yao, Yao and Li, Shiwei and Fang, Tian and Quan, Long},
  title     = {{ContextDesc}: Local Descriptor Augmentation with Cross-Modality Context},
  booktitle = {Computer Vision and Pattern Recognition (CVPR)},
  year      = {2019},
  url       = {https://github.com/lzx551402/contextdesc}
}

@article{LFNet,
  author  = {Ono, Yuki and Trulls, Eduard and Fua, Pascal and Yi, Kwang Moo},
  title   = {LF-Net: Learning local features from images},
  journal = {Advances in neural information processing systems},
  volume  = {31},
  url     = {https://github.com/vcg-uvic/lf-net-release},
  year    = {2018}
}

@inproceedings{R2D2,
  title={{R2D2:} Repeatable and Reliable Detector and Descriptor},
  author={Jerome Revaud and Philippe Weinzaepfel and C{\'{e}}sar Roberto de Souza and Martin Humenberger},
  booktitle={NeurIPS},
  url={https://github.com/naver/r2d2},
  year={2019}
}

@article{BEBLID,
  author    = {Su{\'a}rez, Iago and Sfeir, Ghesn and Buenaposada, Jos{\'e} M and Baumela, Luis},
  title     = {BEBLID: Boosted efficient binary local image descriptor},
  journal   = {Pattern recognition letters},
  volume    = {133},
  pages     = {366--372},
  publisher = {Elsevier},
  year      = {2020}
}

@article{DISK,
  author  = {Tyszkiewicz, Micha{\l} and Fua, Pascal and Trulls, Eduard},
  title   = {DISK: Learning local features with policy gradient},
  journal = {Advances in Neural Information Processing Systems},
  volume  = {33},
  pages   = {14254--14265},
  url     = {https://arxiv.org/abs/2006.13566},
  year    = {2020}
}

@inproceedings{Xfeat,
  author    = {Potje, Guilherme and Cadar, Felipe and Araujo, Andr{\'e} and Martins, Renato and Nascimento, Erickson R},
  title     = {XFeat: Accelerated Features for Lightweight Image Matching},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition},
  pages     = {2682--2691},
  url       = {https://arxiv.org/abs/2404.19174},
  year      = {2024}
}

@inproceedings{LightGlue,
  author    = {Lindenberger, Philipp and Sarlin, Paul-Edouard and Pollefeys, Marc},
  title     = {Lightglue: Local feature matching at light speed},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision},
  pages     = {17627--17638},
  url       = {https://arxiv.org/abs/2306.13643},
  year      = {2023}
}

@article{VPR_Tutorial,
  author  = {Schubert, Stefan and Neubert, Peer and Garg, Sourav and Milford, Michael and Fischer, Tobias},
  title   = {Visual Place Recognition: A Tutorial},
  journal = {IEEE Robotics \& Automation Magazine},
  doi     = {10.1109/MRA.2023.3310859},
  url     = {https://github.com/stschubert/VPR_Tutorial.git},
  year    = {2023}
}

@article{DepthAnythingV2,
  author  = {Yang, Lihe and Kang, Bingyi and Huang, Zilong and Zhao, Zhen and Xu, Xiaogang and Feng, Jiashi and Zhao, Hengshuang},
  title   = {Depth Anything V2},
  journal = {arXiv:2406.09414},
  url     = {https://github.com/DepthAnything/Depth-Anything-V2},
  year    = {2024}
}

@inproceedings{RAFTStereo,
  author    = {Lipson, Lahav and Teed, Zachary and Deng, Jia},
  title     = {RAFT-Stereo: Multilevel Recurrent Field Transforms for Stereo Matching},
  booktitle = {International Conference on 3D Vision (3DV)},
  url       = {https://github.com/princeton-vl/RAFT-Stereo},
  year      = {2021}
}

@inproceedings{CREStereo,
  author    = {Li, Jiankun and Wang, Peisen and Xiong, Pengfei and Cai, Tao and Yan, Ziwei and Yang, Lei and Liu, Jiangyu and Fan, Haoqiang and Liu, Shuaicheng},
  title     = {Practical stereo matching via cascaded recurrent network with adaptive correlation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition},
  pages     = {16263--16272},
  url       = {https://github.com/megvii-research/CREStereo},
  year      = {2022}
}

@inproceedings{MonoGS,
  author    = {Hidenobu Matsuki and Riku Murai and Paul H. J. Kelly and Andrew J. Davison},
  title     = {{G}aussian {S}platting {SLAM}},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition},
  url       = {https://github.com/muskie82/MonoGS},
  year      = {2024}
}

@misc{master,
  author        = {Vincent Leroy and Yohann Cabon and Jérôme Revaud},
  title         = {Grounding Image Matching in 3D with MASt3R},
  eprint        = {2406.09756},
  archivePrefix = {arXiv},
  primaryClass  = {cs.CV},
  url           = {https://arxiv.org/abs/2406.09756},
  year          = {2024}
}

@misc{mvduster,
  author        = {Zhenggang Tang and Yuchen Fan and Dilin Wang and Hongyu Xu and Rakesh Ranjan and Alexander Schwing and Zhicheng Yan},
  title         = {MV-DUSt3R+: Single-Stage Scene Reconstruction from Sparse Views In 2 Seconds},
  eprint        = {2412.06974},
  archivePrefix = {arXiv},
  primaryClass  = {cs.CV},
  url           = {https://arxiv.org/abs/2412.06974},
  year          = {2024}
}